This is an R Markdown Notebook. When you execute code within the notebook, the results appear beneath the code.
Try executing this chunk by clicking the Run button within the chunk or by placing your cursor inside it and pressing Cmd+Shift+Enter.
library(rjson)
library(dplyr)
jobs_2020 = fromJSON(file = "indeed_job_descs_2020_09_20.json")
jobs_2021 = fromJSON(file = "indeed_job_descs_2021_01_25.json")
This first code block works
jobs_df = data.frame("Job", "State", "Employment",
"description", 2020)
names(jobs_df) = c("Job","State","Employment", "Description", "Year")
for(i in 1:length(jobs_2020)) {
job = jobs_2020[[i]]$request_params[1]
state = jobs_2020[[i]]$request_params[2]
employment = jobs_2020[[i]]$request_params[3]
year = 2020
#print(i)
for(j in 1:length(jobs_2020[[i]]$job_descriptions)) {
descript = jobs_2020[[i]]$job_descriptions[j]
temp_df = as.data.frame(c(job,state,employment, descript, year))
names(temp_df) = c("Job","State","Employment", "Description", "Year")
jobs_df = rbind(jobs_df, temp_df)
#print(j)
}
}
head(jobs_df)
dim(jobs_df)
There is no data for anything past the 4th description
#split dataframe into new dataframes based on job description
library(dplyr)
master_df <- jobs_df %>%
group_by(Job)
group_split(master_df)
<list_of<
tbl_df<
Job : character
State : character
Employment : character
Description: character
Year : double
>
>[16]>
[[1]]
[[2]]
[[3]]
[[4]]
[[5]]
[[6]]
[[7]]
[[8]]
[[9]]
[[10]]
[[11]]
[[12]]
[[13]]
[[14]]
[[15]]
[[16]]
group_keys(master_df)
LS0tDQp0aXRsZTogIlIgTm90ZWJvb2siDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQpUaGlzIGlzIGFuIFtSIE1hcmtkb3duXShodHRwOi8vcm1hcmtkb3duLnJzdHVkaW8uY29tKSBOb3RlYm9vay4gV2hlbiB5b3UgZXhlY3V0ZSBjb2RlIHdpdGhpbiB0aGUgbm90ZWJvb2ssIHRoZSByZXN1bHRzIGFwcGVhciBiZW5lYXRoIHRoZSBjb2RlLiANCg0KVHJ5IGV4ZWN1dGluZyB0aGlzIGNodW5rIGJ5IGNsaWNraW5nIHRoZSAqUnVuKiBidXR0b24gd2l0aGluIHRoZSBjaHVuayBvciBieSBwbGFjaW5nIHlvdXIgY3Vyc29yIGluc2lkZSBpdCBhbmQgcHJlc3NpbmcgKkNtZCtTaGlmdCtFbnRlciouIA0KDQpgYGB7cn0NCmxpYnJhcnkocmpzb24pDQpsaWJyYXJ5KGRwbHlyKQ0KDQpqb2JzXzIwMjAgPSBmcm9tSlNPTihmaWxlID0gImluZGVlZF9qb2JfZGVzY3NfMjAyMF8wOV8yMC5qc29uIikNCmpvYnNfMjAyMSA9IGZyb21KU09OKGZpbGUgPSAiaW5kZWVkX2pvYl9kZXNjc18yMDIxXzAxXzI1Lmpzb24iKQ0KYGBgDQoNCg0KVGhpcyBmaXJzdCBjb2RlIGJsb2NrIHdvcmtzDQpgYGB7cn0NCmpvYnNfZGYgPSBkYXRhLmZyYW1lKCJKb2IiLCAiU3RhdGUiLCAiRW1wbG95bWVudCIsIA0KICAgICAgICAgICAgICAgICAgICAgImRlc2NyaXB0aW9uIiwgMjAyMCkNCg0KbmFtZXMoam9ic19kZikgPSBjKCJKb2IiLCJTdGF0ZSIsIkVtcGxveW1lbnQiLCAiRGVzY3JpcHRpb24iLCAiWWVhciIpDQoNCmZvcihpIGluIDE6bGVuZ3RoKGpvYnNfMjAyMCkpIHsNCiAgam9iID0gam9ic18yMDIwW1tpXV0kcmVxdWVzdF9wYXJhbXNbMV0NCiAgc3RhdGUgPSBqb2JzXzIwMjBbW2ldXSRyZXF1ZXN0X3BhcmFtc1syXQ0KICBlbXBsb3ltZW50ID0gam9ic18yMDIwW1tpXV0kcmVxdWVzdF9wYXJhbXNbM10NCiAgeWVhciA9IDIwMjANCiAgDQogICNwcmludChpKQ0KICANCiAgZm9yKGogaW4gMTpsZW5ndGgoam9ic18yMDIwW1tpXV0kam9iX2Rlc2NyaXB0aW9ucykpIHsNCiAgICBkZXNjcmlwdCA9IGpvYnNfMjAyMFtbaV1dJGpvYl9kZXNjcmlwdGlvbnNbal0NCiAgICB0ZW1wX2RmID0gYXMuZGF0YS5mcmFtZShjKGpvYixzdGF0ZSxlbXBsb3ltZW50LCBkZXNjcmlwdCwgeWVhcikpDQogICAgbmFtZXModGVtcF9kZikgPSBjKCJKb2IiLCJTdGF0ZSIsIkVtcGxveW1lbnQiLCAiRGVzY3JpcHRpb24iLCAiWWVhciIpDQogICAgam9ic19kZiA9IHJiaW5kKGpvYnNfZGYsIHRlbXBfZGYpDQogICAgI3ByaW50KGopDQogIH0NCn0NCg0KDQpoZWFkKGpvYnNfZGYpDQpkaW0oam9ic19kZikNCmBgYA0KVGhlcmUgaXMgbm8gZGF0YSBmb3IgYW55dGhpbmcgcGFzdCB0aGUgNHRoIGRlc2NyaXB0aW9uDQpgYGB7cn0NCmZvcihpIGluIDE6NCkgew0KICBqb2IgPSBqb2JzXzIwMjFbW2ldXSRyZXF1ZXN0X3BhcmFtc1sxXQ0KICBzdGF0ZSA9IGpvYnNfMjAyMVtbaV1dJHJlcXVlc3RfcGFyYW1zWzJdDQogIGVtcGxveW1lbnQgPSBqb2JzXzIwMjFbW2ldXSRyZXF1ZXN0X3BhcmFtc1szXQ0KICB5ZWFyID0gMjAyMQ0KICANCiAgcHJpbnQoaSkNCiAgDQogIGZvcihqIGluIDE6bGVuZ3RoKGpvYnNfMjAyMVtbaV1dJGpvYl9kZXNjcmlwdGlvbnMpKSB7DQogICAgZGVzY3JpcHQgPSBqb2JzXzIwMjFbW2ldXSRqb2JfZGVzY3JpcHRpb25zW2pdDQogICAgdGVtcF9kZiA9IGFzLmRhdGEuZnJhbWUoYyhqb2Isc3RhdGUsZW1wbG95bWVudCwgZGVzY3JpcHQsIHllYXIpKQ0KICAgIG5hbWVzKHRlbXBfZGYpID0gYygiSm9iIiwiU3RhdGUiLCJFbXBsb3ltZW50IiwgIkRlc2NyaXB0aW9uIiwgIlllYXIiKQ0KICAgIGpvYnNfZGYgPSByYmluZChqb2JzX2RmLCB0ZW1wX2RmKQ0KICAgIHByaW50KGopDQogIH0NCn0NCg0KI2pvYnNfMjAyMQ0KDQpoZWFkKGpvYnNfZGYpDQpkaW0oam9ic19kZikNCg0KI3JlbW92ZSB0aGUgZmlyc3Qgcm93IGJlY2F1c2UgaXQgaXMgdXNlbGVzcw0Kam9ic19kZiA8LSBqb2JzX2RmWy0xLF0NCmBgYA0KDQoNCmBgYHtyfQ0KI3NwbGl0IGRhdGFmcmFtZSBpbnRvIG5ldyBkYXRhZnJhbWVzIGJhc2VkIG9uIGpvYiBkZXNjcmlwdGlvbg0KbGlicmFyeShkcGx5cikNCm1hc3Rlcl9kZiA8LSBqb2JzX2RmICU+JQ0KICBncm91cF9ieShKb2IpDQoNCmdyb3VwX3NwbGl0KG1hc3Rlcl9kZikNCmdyb3VwX2tleXMobWFzdGVyX2RmKQ0KDQoNCg0KYGBgDQo=